# Remove every object that ls() reports in the current environment, so the
# script does not pick up leftovers from an earlier interactive session.
# NOTE(review): this also wipes the workspace of anyone who source()s this
# file, and it does not detach packages or reset options -- consider running
# the script in a fresh R session instead.
rm(list = ls())

library(data.table)
library(estimatr)

# Wrap each element of `x` in backticks so that non-syntactic names can be
# pasted into a formula string.
#
# x: vector of names (coerced to character by paste0).
# Returns a character vector with every element surrounded by backticks.
add_backticks <- function(x) {
  tick <- "`"
  paste0(tick, x, tick)
}

# Build the right-hand side of a model formula from a vector of column names.
#
# x: vector of column names.
# Returns a single string: the backtick-quoted names joined by " + ".
x_lm_formula <- function(x) {
  quoted_terms <- add_backticks(x)
  paste(quoted_terms, collapse = " + ")
}


# Load the saved workspace image; it is expected to provide the data.table
# `panel_all` that every statement below modifies by reference.
load('./data/panel_month_dummies_all_2020_months.RData')

# covid2: 1 for rows whose month is strictly after 2020-01-01, 0 otherwise.
panel_all[, covid2 := as.numeric(month > '2020-01-01')]

# covid_death: excess_deaths_jan_d switched on only in the covid2 == 1 rows.
panel_all[, covid_death := covid2 * excess_deaths_jan_d]

# Treat a missing extr_right_mayor value as 0.
panel_all[is.na(extr_right_mayor), extr_right_mayor := 0]

# Month dummy columns: every column whose name contains "month_2". Captured
# once, before any interaction columns (which also contain that text) exist.
month_cols <- grep('month_2', colnames(panel_all), value = TRUE)

# less_college is 100 minus educ_diplBA (presumably the percentage without a
# BA diploma -- confirm the units of educ_diplBA).
panel_all[, less_college := 100 - educ_diplBA]

# For each covariate, create one column per month dummy holding
# dummy * covariate, named "<prefix>_<month dummy name>". The order of this
# map fixes the order in which the new columns are appended.
interaction_sources <- c(
  educ     = 'less_college',
  foreign  = 'foreign_pop',
  old      = 'above75_share',
  localgov = 'extr_right_mayor'
)

for (prefix in names(interaction_sources)) {
  covariate_values  <- panel_all[[interaction_sources[[prefix]]]]
  interaction_names <- paste(prefix, month_cols, sep = '_')
  panel_all[, (interaction_names) := lapply(.SD, function(dummy) {
    dummy * covariate_values
  }), .SDcols = month_cols]
}

# Drop the loop scaffolding so the workspace holds the same objects as before.
rm(interaction_sources, prefix, covariate_values, interaction_names)

# Position of the interaction column left out of every control set.
# NOTE(review): presumably the reference month, omitted to avoid collinearity
# with the fixed effects -- confirm which month sits at position 157. A
# negative index beyond the vector length is silently ignored by R, so if
# fewer than 157 columns match, nothing is dropped.
reference_position <- 157

# Return the names of the columns matching `pattern`, minus the one at
# `reference_position`.
select_without_reference <- function(pattern) {
  matched <- grep(pattern, colnames(panel_all), value = TRUE)
  matched[-reference_position]
}

educ_cols    <- select_without_reference('educ_month')
foreign_cols <- select_without_reference('foreign_month')
old_cols     <- select_without_reference('old_month')
gov_cols     <- select_without_reference('localgov_month')

# Full set of month-interacted controls used by the "con" specifications.
flex_controls <- c(educ_cols, foreign_cols, old_cols, gov_cols)

# time: number of days between `month` and 2020-01-01, divided by the average
# month length (365.25 / 12 days) and rounded to the nearest whole number.
reference_date <- as.Date('2020-01-01', format = '%Y-%m-%d')
days_per_month <- 365.25 / 12
panel_all[, time := as.numeric(round((month - reference_date) / days_per_month))]

# Province-specific linear trends: each province column multiplied by `time`,
# stored as "trend_<province column name>".
province_cols <- grep('code_province_', colnames(panel_all), value = TRUE)
trend_names   <- paste('trend', province_cols, sep = '_')
time_values   <- panel_all[['time']]
panel_all[, (trend_names) := lapply(.SD, function(dummy) dummy * time_values),
          .SDcols = province_cols]

# Keep every trend column except the first match (presumably the reference
# province -- confirm).
trend_cols <- grep('trend_code_province', colnames(panel_all), value = TRUE)[-1]

# Baseline specification: hc_pc_asians regressed on covid_death only, with
# panelvar and month fixed effects and se_type = 'stata' standard errors
# clustered on panelvar.
out_death_jan <- lm_robust(hc_pc_asians ~ covid_death, data=panel_all, se_type='stata',
                           clusters = panelvar, fixed_effects = ~ panelvar + month)
# Persist the fit under its own object name, then drop it from the workspace
# (presumably to free memory before the larger models).
save(out_death_jan, file = './output/out_death_jan_2020_all.RData')
rm(out_death_jan)

# Controls specification: the baseline regressor plus every column in
# flex_controls, with each name backtick-quoted by x_lm_formula().
formula_flex_controls <- as.formula(paste("hc_pc_asians ~ covid_death +", x_lm_formula(flex_controls)))

# Same estimator settings as the baseline fit: panelvar and month fixed
# effects, se_type = 'stata', clustered on panelvar.
out_death_jan_con <- lm_robust(formula = formula_flex_controls,
                               data=panel_all, se_type='stata',
                               clusters = panelvar, fixed_effects = ~ panelvar + month)

# Persist the fit, then remove it from the workspace.
save(out_death_jan_con, file = './output/out_death_jan_con_2020_all.RData')

rm(out_death_jan_con)

# trend_death: linear time trend scaled by excess_deaths_jan_d.
panel_all[,trend_death:=time*excess_deaths_jan_d]

# Controls + trend specification: adds trend_death to the controls formula.
formula_flex_controls_trend <- as.formula(paste("hc_pc_asians ~ covid_death + trend_death +", x_lm_formula(flex_controls)))

# Same estimator settings as the earlier fits.
out_death_jan_con_trend <- lm_robust(formula = formula_flex_controls_trend,
                                     data=panel_all, se_type='stata',
                                     clusters = panelvar, fixed_effects = ~ panelvar + month)

# Persist the fit, then remove it from the workspace.
save(out_death_jan_con_trend, file = './output/out_death_jan_con_trend_2020_all.RData')

rm(out_death_jan_con_trend)

# Rebuild the control set with the province trend columns.
# NOTE(review): gov_cols (the localgov interactions) is not included here,
# although it was part of the earlier control set -- confirm that dropping it
# is intentional rather than an accidental substitution for trend_cols.
flex_controls <- c(educ_cols, foreign_cols, old_cols, trend_cols)

# Overwrites the formula_flex_controls object defined for the earlier
# controls-only model.
formula_flex_controls <- as.formula(paste("hc_pc_asians ~ covid_death + trend_death +", x_lm_formula(flex_controls)))

# Same estimator settings as the earlier fits.
out_death_jan_con_trend_all <- lm_robust(formula = formula_flex_controls,
                                         data=panel_all, se_type='stata',
                                         clusters = panelvar, fixed_effects = ~ panelvar + month)

# Persist the fit; unlike the earlier models it is left in the workspace.
save(out_death_jan_con_trend_all, file = './output/out_death_jan_con_trend_all_2020_all.RData')
